import pdfplumber

# Extract the text of the first page
# with pdfplumber.open("Baichuan 2 Open Large-scale Language Models.pdf") as pdf:
#     first_page = pdf.pages[0]
#     print(first_page.extract_text())

# Extract the table on the third page
# with pdfplumber.open("Baichuan 2 Open Large-scale Language Models.pdf") as pdf:
#     table = pdf.pages[2].extract_table()
#     for row in table:
#         print(row)

# Print every image entry found on the third page of the PDF.
with pdfplumber.open("Baichuan 2 Open Large-scale Language Models.pdf") as document:
    # `pages` is indexed from zero, so index 2 selects the third page.
    third_page = document.pages[2]
    # Each entry of `images` is printed as-is, one per line.
    for image_entry in third_page.images:
        print(image_entry)